# -*- coding:utf-8 -*-

from wordcloud import WordCloud, STOPWORDS
import pandas as pd
import jieba
import matplotlib.pyplot as plt
# import seaborn as sns
from pyecharts import Geo, Style, Line, Bar, Overlap


f = open('out2/爱情公寓_new.txt', encoding='utf-8')
data = pd.read_csv(f, sep=',', header=None, encoding='utf-8', names=['date', 'nickname', 'city', 'rate', 'comment'])

city = data.groupby(['city'])
rate_group = city['rate']
city_com = city['rate'].agg(['mean', 'count'])
# print(city_com)
city_com.reset_index(inplace=True)
city_com['mean'] = round(city_com['mean'], 2)

# 热力图分析
data_map = [(city_com['city'][i], city_com['count'][i]) for i in range(0, city_com.shape[0])]
# print(data_map)
style = Style(title_color="#fff", title_pos="center",
              width=1200, height=600, background_color="#404a59")

geo = Geo("《爱情公寓》粉丝人群地理位置", "数据来源：猫眼影评", **style.init_style)

while True:
    try:
        attr, val = geo.cast(data_map)
        geo.add("", attr, val, visual_range=[0, 20],
                visual_text_color="#fff", symbol_size=20,
                is_visualmap=True, is_piecewise=True,
                visual_split_number=4)
    except ValueError as e:
        e = str(e)
        e = e.split("No coordinate is specified for ")[1]  # 获取不支持的城市名
        for i in range(0, len(data_map)):
            if e in data_map[i]:
                data_map.pop(i)
                break

    else:
        break
geo.render('out2/爱情公寓-热力图分析.html')

# 折线+柱图分析
city_main = city_com.sort_values('count', ascending=False)[0:20]
# print(city_main)
attr = city_main['city']
v1 = city_main['count']
v2 = city_main['mean']
# print(attr,v1,v2)
line = Line("主要城市评分")
line.add("评分", attr, v2, is_stack=True, xaxis_rotate=30, yaxix_min=4.2,
         mark_point=['min', 'max'], xaxis_interval=0, line_color='lightblue',
         line_width=4, mark_point_textcolor='black', mark_point_color='lightblue',
         is_splitline_show=False)

bar = Bar("主要城市评论数")
bar.add("评论数", attr, v1, is_stack=True, xaxis_rotate=30, yaxix_min=4.2,
        xaxis_interval=0, is_splitline_show=False)

overlap = Overlap()
overlap.add(bar)
overlap.add(line, yaxis_index=1, is_add_yaxis=True)
overlap.render('out2/爱情公寓-主要城市评论数-平均分.html')

# 词云分析
# 分词
comment = jieba.cut(str(data['comment']), cut_all=False)
wl_space_split = " ".join(comment)

# 导入背景图
backgroud_Image = plt.imread('sources/background.jpg')
stopwords = STOPWORDS.copy()
# print("STOPWORDS.copy()",help(STOPWORDS.copy()))


wc = WordCloud(width=1024, height=768, background_color='white',
               mask=backgroud_Image, font_path="sources/于洪亮硬笔行楷.ttf",
               stopwords=stopwords, max_font_size=400,
               random_state=50)

wc.generate_from_text(wl_space_split)
plt.imshow(wc)
plt.axis('off')  # 不显示坐标轴
plt.show()
wc.to_file(r'out2/爱情公寓-词云分析.jpg')
